LOCUS pDONR™/Zeo DISCLAIMER Certain terms are trademarks or registered trademarks of Invitrogen Corporation. See "Intellectual Property" in the Help file for more information. FEATURES Location/Qualifiers misc_feature complement(268..295) /note="rrnB T2 transcription termination sequence (c)" misc_feature complement(427..470) /note="rrnB T1 transcription termination sequence (c)" primer_bind 537..552 /note="M13 Forward (-20) priming site" misc_recomb 570..668 /label=attL1 /note="attL1" misc_recomb complement(2372..2468) /label=attL2 /note="attL2 (c)" misc_signal complement(2483..2502) /note="T7 Promoter/priming site (c)" primer_bind 2510..2526 /note="M13 Reverse priming site" gene 2639..3448 /note="Kanamycin resistance gene" rep_origin 3569..4242 /note="pUC origin" vector join(2380..4245,1..651) /source="pDONR%99221" /type="Donor Vector" misc_feature 669..691 /note="TEV site" source 692..2365 /organism="Homo sapiens" /mol_type="mRNA" /db_xref="taxon:9606" /clone="MGC:43305 IMAGE:5265475" /tissue_type="Testis" /clone_lib="NIH_MGC_97" /lab_host="DH10B" /note="Vector: pBluescriptR" gene 692..2365 /gene="GALNTL4" /gene_synonym=GalNAc-T15 /gene_synonym=GALNT15 /gene_synonym=GALNT18 /gene_synonym=MGC71806 /db_xref="GeneID:374378" /db_xref="HGNC:30488" CDS 692..2365 /dnas_title="UDP-N-acetyl-alpha-D-galactosamine:polypeptid e N-acetylgalactosaminyltransferase-like 4" /gene="GALNTL4" /gene_synonym=GalNAc-T15 /gene_synonym=GALNT15 /gene_synonym=GALNT18 /gene_synonym=MGC71806 /codon_start=1 /product="UDP-N-acetyl-alpha-D-galactosamine:polypeptide N-acetylgalactosaminyltransferase-like 4" /protein_id="AAH37341.3" /db_xref="GI:54673631" /db_xref="GeneID:374378" /db_xref="HGNC:30488" /translation="MVCTRKTKTLVSTCVILSGMTNIICLLYVGWVTNYIASVYVRGQ EPAPDKKLEEDKGDTLKIIERLDHLENVIKQHIQEAPAKPEEAEAEPFTDSSLFAHWG QELSPEGRRVALKQFQYYGYNAYLSDRLPLDRPLPDLRPSGCRNLSFPDSLPEVSIVF IFVNEALSVLLRSIHSAMERTPPHLLKEIILVDDNSSNEELKEKLTEYVDKVNSQKPG FIKVVRHSKQEGLIRSRVSGWRAATAPVVALFDAHVEFNVGWAEPVLTRIKENRKRII SPSFDNIKYDNFEIEEYPLAAQGFDWELWCRYLNPPKAWWKLENSTAPIRSPALIGCF IVDRQYFQEIGLLDEGMEVYGGENVELGIRVWQCGGSVEVLPCSRIAHIERAHKPYTE DLTAHVRRNALRVAEVWMDEFKSHVYMAWNIPQEDSGIDIGDITARKALRKQLQCKTF RWYLVSVYPEMRMYSDIIAYGVLQNSLKTDLCLDQGPDTENVPIMYICHGMTPQNVYY TSSQQIHVGILSPTVDDDDNRCLVDVNSRPRLIECSYAKAKRMKLHWQFSQGGPIQNR KSKRCLELQENSDLEFGFQLVLQKCSGQHWSITNVLRSLAS" misc_feature 692..2365 /note="GALNTL4 coding region" misc_difference 2359..2359 /gene="GALNTL4" /gene_synonym=GalNAc-T15 /gene_synonym=GALNT15 /gene_synonym=GALNT18 /gene_synonym=MGC71806 /note="'G' in cDNA is 'C' in the human genome; no amino acid change." ORIGIN 1 CTTTCCTGCG TTATCCCCTG ATTCTGTGGA TAACCGTATT ACCGCCTTTG AGTGAGCTGA 61 TACCGCTCGC CGCAGCCGAA CGACCGAGCG CAGCGAGTCA GTGAGCGAGG AAGCGGAAGA 121 GCGCCCAATA CGCAAACCGC CTCTCCCCGC GCGTTGGCCG ATTCATTAAT GCAGCTGGCA 181 CGACAGGTTT CCCGACTGGA AAGCGGGCAG TGAGCGCAAC GCAATTAATA CGCGTACCGC 241 TAGCCAGGAA GAGTTTGTAG AAACGCAAAA AGGCCATCCG TCAGGATGGC CTTCTGCTTA 301 GTTTGATGCC TGGCAGTTTA TGGCGGGCGT CCTGCCCGCC ACCCTCCGGG CCGTTGCTTC 361 ACAACGTTCA AATCCGCTCC CGGCGGATTT GTCCTACTCA GGAGAGCGTT CACCGACAAA 421 CAACAGATAA AACGAAAGGC CCAGTCTTCC GACTGAGCCT TTCGTTTTAT TTGATGCCTG 481 GCAGTTCCCT ACTCTCGCGT TAACGCTAGC ATGGATGTTT TCCCAGTCAC GACGTTGTAA 541 AACGACGGCC AGTCTTAAGC TCGGGCCCCA AATAATGATT TTATTTTGAC TGATAGTGAC 601 CTGTTCGTTG CAACACATTG ATGAGCAATG CTTTTTTATA ATGCCAACTT TGTACAAAAA 661 AGCAGGCTct gaaaacttgt actttcaagg caagaagctg gaggaagaca aaggggacac 721 tctgaagatt attgagcggc tggaccacct ggagaatgtc atcaagcagc acattcaaga 781 ggctcctgcc aagcctgagg aggcagaggc cgagcccttc acagactcct ctctgtttgc 841 acactggggc caggagctca gccccgaagg ccggcgcgtg gccctgaagc aattccagta 901 ctacggctac aacgcctacc tcagcgaccg cctgcccctg gaccggcccc tgcctgacct 961 cagacccagt gggtgccgta acctctcatt tcctgacagc ctgccagagg tgagcatcgt 1021 gttcatcttc gtcaatgaag cgctttcagt gctgctgcgc tccatccact cggccatgga 1081 acgcacgccc ccacatctgc tcaaggagat cattctggtg gatgacaaca gcagtaacga 1141 ggaactgaag gagaagctga ccgaatatgt ggacaaggtg aacagccaga agccaggctt 1201 catcaaagtc gtgcgtcaca gcaagcagga aggcctcatc cgctccaggg tcagtggctg 1261 gagggcggcc actgcccctg tggtggcact ctttgatgcc cacgtggagt tcaatgtggg 1321 ctgggctgaa cctgtactca cccgcatcaa ggagaaccgg aagcggatca tctcgccatc 1381 ctttgataac atcaaatatg acaactttga gatagaagag tacccgctgg ctgcccaggg 1441 ctttgactgg gagctgtggt gccgctacct aaatcccccc aaggcctggt ggaagctgga 1501 gaactccaca gcgccaatca ggagccctgc cctcattggc tgcttcattg tggaccggca 1561 gtacttccag gagatcggcc tgctggacga aggcatggaa gtctacgggg gcgagaatgt 1621 ggagcttggg atcagggtgt ggcagtgtgg cgggagtgtg gaggtcctgc cctgctcacg 1681 gattgcccac attgagcgag cccacaagcc ctacacagag gacctcaccg cccatgtccg 1741 caggaacgct ctcagggtgg ctgaagtctg gatggatgaa tttaaaagcc acgtctacat 1801 ggcatggaac ataccgcagg aggactcagg aattgacatt ggggacatca ctgcaaggaa 1861 ggctctcagg aaacagctgc agtgcaagac cttccggtgg tacctggtca gcgtgtaccc 1921 agagatgagg atgtactccg acatcattgc ctatggagtg ctgcagaatt ctctgaagac 1981 tgatttgtgt cttgaccagg ggccagatac agagaatgtc cccatcatgt acatctgcca 2041 tgggatgacg cctcagaacg tgtactacac gagcagtcag cagatccatg tgggcattct 2101 gagccccacc gtggatgatg atgacaaccg atgcctggtg gacgtcaaca gccggccccg 2161 gctcatcgaa tgcagctacg ccaaagccaa gaggatgaag cttcactggc agttctctca 2221 gggaggaccc atccagaacc gcaagtctaa gcgctgtctg gagctgcagg agaatagcga 2281 cctggagttc ggcttccagc tggtgttgca gaagtgctcg ggccagcact ggagcatcac 2341 caacgtcctg aggagcctgg cgtccTAGGA CCCAGCTTTC TTGTACAAAG TTGGCATTAT 2401 AAGAAAGCAT TGCTTATCAA TTTGTTGCAA CGAACAGGTC ACTATCAGTC AAAATAAAAT 2461 CATTATTTGC CATCCAGCTG ATATCCCCTA TAGTGAGTCG TATTACATGG TCATAGCTGT 2521 TTCCTGGCAG CTCTGGCCCG TGTCTCAAAA TCTCTGATGT TACATTGCAC AAGATAAAAT 2581 AATATCATCA TGAACAATAA AACTGTCTGC TTACATAAAC AGTAATACAA GGGGTGTTAT 2641 GAGCCATATT CAACGGGAAA CGTCGAGGCC GCGATTAAAT TCCAACATGG ATGCTGATTT 2701 ATATGGGTAT AAATGGGCTC GCGATAATGT CGGGCAATCA GGTGCGACAA TCTATCGCTT 2761 GTATGGGAAG CCCGATGCGC CAGAGTTGTT TCTGAAACAT GGCAAAGGTA GCGTTGCCAA 2821 TGATGTTACA GATGAGATGG TCAGACTAAA CTGGCTGACG GAATTTATGC CTCTTCCGAC 2881 CATCAAGCAT TTTATCCGTA CTCCTGATGA TGCATGGTTA CTCACCACTG CGATCCCCGG 2941 AAAAACAGCA TTCCAGGTAT TAGAAGAATA TCCTGATTCA GGTGAAAATA TTGTTGATGC 3001 GCTGGCAGTG TTCCTGCGCC GGTTGCATTC GATTCCTGTT TGTAATTGTC CTTTTAACAG 3061 CGATCGCGTA TTTCGTCTCG CTCAGGCGCA ATCACGAATG AATAACGGTT TGGTTGATGC 3121 GAGTGATTTT GATGACGAGC GTAATGGCTG GCCTGTTGAA CAAGTCTGGA AAGAAATGCA 3181 TAAACTTTTG CCATTCTCAC CGGATTCAGT CGTCACTCAT GGTGATTTCT CACTTGATAA 3241 CCTTATTTTT GACGAGGGGA AATTAATAGG TTGTATTGAT GTTGGACGAG TCGGAATCGC 3301 AGACCGATAC CAGGATCTTG CCATCCTATG GAACTGCCTC GGTGAGTTTT CTCCTTCATT 3361 ACAGAAACGG CTTTTTCAAA AATATGGTAT TGATAATCCT GATATGAATA AATTGCAGTT 3421 TCATTTGATG CTCGATGAGT TTTTCTAATC AGAATTGGTT AATTGGTTGT AACACTGGCA 3481 GAGCATTACG CTGACTTGAC GGGACGGCGC AAGCTCATGA CCAAAATCCC TTAACGTGAG 3541 TTACGCGTCG TTCCACTGAG CGTCAGACCC CGTAGAAAAG ATCAAAGGAT CTTCTTGAGA 3601 TCCTTTTTTT CTGCGCGTAA TCTGCTGCTT GCAAACAAAA AAACCACCGC TACCAGCGGT 3661 GGTTTGTTTG CCGGATCAAG AGCTACCAAC TCTTTTTCCG AAGGTAACTG GCTTCAGCAG 3721 AGCGCAGATA CCAAATACTG TTCTTCTAGT GTAGCCGTAG TTAGGCCACC ACTTCAAGAA 3781 CTCTGTAGCA CCGCCTACAT ACCTCGCTCT GCTAATCCTG TTACCAGTGG CTGCTGCCAG 3841 TGGCGATAAG TCGTGTCTTA CCGGGTTGGA CTCAAGACGA TAGTTACCGG ATAAGGCGCA 3901 GCGGTCGGGC TGAACGGGGG GTTCGTGCAC ACAGCCCAGC TTGGAGCGAA CGACCTACAC 3961 CGAACTGAGA TACCTACAGC GTGAGCTATG AGAAAGCGCC ACGCTTCCCG AAGGGAGAAA 4021 GGCGGACAGG TATCCGGTAA GCGGCAGGGT CGGAACAGGA GAGCGCACGA GGGAGCTTCC 4081 AGGGGGAAAC GCCTGGTATC TTTATAGTCC TGTCGGGTTT CGCCACCTCT GACTTGAGCG 4141 TCGATTTTTG TGATGCTCGT CAGGGGGGCG GAGCCTATGG AAAAACGCCA GCAACGCGGC 4201 CTTTTTACGG TTCCTGGCCT TTTGCTGGCC TTTTGCTCAC ATGTT //